# -*- coding: utf-8 -*-

# pip install beautifulsoup4
from bs4 import BeautifulSoup


def demo():
    """Parse a small hard-coded HTML document and print its title text.

    The markup is handed to BeautifulSoup with the ``html5lib`` parser
    (requires ``pip install html5lib``), and the string inside the
    ``<title>`` element is written to standard output.
    """
    html_doc = """
        <html><head><title>The Dormouse's story</title></head>
        <body>
        <p class="title"><b>The Dormouse's story</b></p>

        <p class="story">Once upon a time there were three little sisters; and their names were
        <a href="http://example.com/elsie" class="sister" id="link1">Elsie</a>,
        <a href="http://example.com/lacie" class="sister" id="link2">Lacie</a> and
        <a href="http://example.com/tillie" class="sister" id="link3">Tillie</a>;
        and they lived at the bottom of a well.</p>

        <p class="story">...</p>
        """
    # The html5lib parser is a separate package: pip install html5lib
    soup = BeautifulSoup(markup=html_doc, features="html5lib")

    # To inspect the parsed tree in formatted form, print soup.prettify().

    # Title: look up the <title> tag first, then print its text.
    title_tag = soup.title
    print(title_tag.string)


# Run the demo only when this file is executed as a script, not on import.
if __name__ == "__main__":
    demo()
